Iakarshu's workspace
Runs
45
Name
42 visualized
Created
Runtime
End Time
Hostname
ID
Notes
State
Updated
Tags
max_steps
_commit_hash
_name_or_path
add_cross_attention
architectures
chunk_size_feed_forward
config
d_ff
d_kv
d_model
decoder_start_token_id
dense_act_fn
diversity_penalty
do_sample
dropout_rate
early_stopping
encoder_no_repeat_ngram_size
eos_token_id
feed_forward_proj
id2label.0
id2label.1
initializer_factor
is_decoder
is_encoder_decoder
is_gated_act
label2id.LABEL_0
label2id.LABEL_1
layer_norm_epsilon
length_penalty
max_length
min_length
model_type
n_positions
no_repeat_ngram_size
num_beam_groups
num_beams
num_decoder_layers
num_heads
num_layers
num_return_sequences
output_attentions
output_hidden_states
6h 18m 10s
May 18 '23 21:06
-
01q773jf
-
Finished
May 18 '23 21:06
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
1m 12s
May 18 '23 14:47
-
671mqj35
-
Crashed
May 18 '23 14:47
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
34s
May 18 '23 14:44
-
yxa5q34c
-
Crashed
May 18 '23 14:44
-
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
-
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
1m
May 18 '23 14:44
-
iudxp6xf
-
Crashed
May 18 '23 14:44
-
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
-
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
3m 15s
May 18 '23 14:43
-
recfzyoc
-
Finished
May 18 '23 14:43
-
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
-
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
4m 26s
May 18 '23 14:39
-
9jqswtan
-
Finished
May 18 '23 14:39
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
6h 5m 45s
May 18 '23 15:27
-
ijpwksgx
-
Finished
May 18 '23 15:27
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
10m 8s
May 18 '23 08:59
-
eay50jzi
-
Finished
May 18 '23 08:59
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
2m 13s
May 18 '23 08:46
-
0t71stjm
-
Crashed
May 18 '23 08:46
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
59s
May 18 '23 08:42
-
r4yj2nut
-
Crashed
May 18 '23 08:42
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
2m 12s
May 18 '23 08:39
-
6yaahlhl
-
Crashed
May 18 '23 08:39
50000
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
33s
May 18 '23 08:35
-
6efi1ngq
-
Crashed
May 18 '23 08:35
-
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
-
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
1m 55s
May 18 '23 08:35
-
345cj8j3
-
Finished
May 18 '23 08:35
50
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
58s
May 18 '23 08:31
-
xcrd6qyu
-
Crashed
May 18 '23 08:31
100
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
2m 34s
May 18 '23 08:30
-
9pvgsfwe
-
Finished
May 18 '23 08:30
100
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
1m 14s
May 18 '23 08:17
-
7vdnor3k
-
Crashed
May 18 '23 08:17
-
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
-
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
2m 31s
May 18 '23 07:57
-
131bqydp
-
Crashed
May 18 '23 07:57
100
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
33s
May 18 '23 07:53
-
wm5i9mxt
-
Crashed
May 18 '23 07:53
-
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
-
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
4m 15s
May 18 '23 07:53
-
xa63kzdo
-
Finished
May 18 '23 07:53
100
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
4m 19s
May 18 '23 07:48
-
bt2ll6fg
-
Finished
May 18 '23 07:48
100
fe6d9bf207cd3337512ca838a8b453f87a9178ef
t5-base
false
["T5ForConditionalGeneration"]
0
T5Config {
"_name_or_path": "t5-base",
"architectures": [
"T5ForConditionalGeneration"
],
"d_ff": 3072,
"d_kv": 64,
"d_model": 768,
"decoder_start_token_id": 0,
"dense_act_fn": "relu",
"dropout_rate": 0.1,
"eos_token_id": 1,
"feed_forward_proj": "relu",
"initializer_factor": 1.0,
"is_encoder_decoder": true,
"is_gated_act": false,
"layer_norm_epsilon": 1e-06,
"max_2d_position_embeddings": 1024,
"model_type": "t5",
"n_positions": 512,
"num_decoder_layers": 12,
"num_heads": 12,
"num_layers": 12,
"output_past": true,
"pad_token_id": 0,
"relative_attention_max_distance": 128,
"relative_attention_num_buckets": 32,
"task_specific_params": {
"summarization": {
"early_stopping": true,
"length_penalty": 2.0,
"max_length": 200,
"min_length": 30,
"no_repeat_ngram_size": 3,
"num_beams": 4,
"prefix": "summarize: "
},
"translation_en_to_de": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to German: "
},
"translation_en_to_fr": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to French: "
},
"translation_en_to_ro": {
"early_stopping": true,
"max_length": 300,
"num_beams": 4,
"prefix": "translate English to Romanian: "
}
},
"transformers_version": "4.27.4",
"use_cache": true,
"vit_model": "google/vit-base-patch16-224-in21k",
"vocab_size": 32128
}
3072
64
768
0
relu
0
false
0.1
false
0
1
relu
LABEL_0
LABEL_1
1
false
true
false
0
1
0.000001
1
20
0
t5
512
0
1
1
12
12
12
1
false
false
1-20
of 45